#!/usr/bin/env bash
# Start `vllm serve` for a locally cached Qwen3-4B checkpoint with automatic
# tool-choice enabled and the "hermes" tool-call parser selected.
#
# Optional environment overrides (the defaults reproduce the original,
# hard-coded command exactly):
#   QWEN_MODEL_PATH  - model directory handed to `vllm serve`
#                      (default: /root/.cache/modelscope/hub/models/Qwen/Qwen3-4B)
#   QWEN_SERVE_PORT  - value handed to --port (default: 8000)
#
# Both expansions are quoted so a path containing spaces stays one argument.
vllm serve "${QWEN_MODEL_PATH:-/root/.cache/modelscope/hub/models/Qwen/Qwen3-4B}" \
  --port "${QWEN_SERVE_PORT:-8000}" \
  --enable-auto-tool-choice \
  --tool-call-parser hermes